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7} PRESS SESS ST TSR VSS STS TSS SSAA CEA SESS SESS K SAAS AS SK TASO SES RASPES Tes AAAI SEE 

p OOXXXXXXXXXAXKXX PINE CONTROL OPCODES:! 0000-3fff 

jp TET SSS S PSSA ASKS SL SH SS TEL SSSSLAAOCREST HKG TST SH RKSSEFTTERSEL SEATS LAARTEKCTEELLUARECKeoeAR=E 
;OODDOOOXXXXXxXXxXX, 3.13c, nop 0000-01f¢ 

0000001 Oxxxxxxxx, 3.14, trap 0200-02fE 

10000001 Ixxxxxxxx unused [8] 0300-03ff 

$ 00000 1Oxxxxxxxxx, 3.138, eint 0400-05ff 

7000001 1xxxxxxxxx, 3.13b, dint 0600-07fE 
10000100xiiiiiili, 3. 6b, lpg fimm 0800-09ff 
$0000101xxxxxxxxx unused [9] 0a00-Obf f 

300001 LOAxxxmmNNN, 3.10, norm ax, (Rn}+ 0c00-Odf f 6/8 Rns 
70000111xxxxmmNNN, Pps modr (Rn}+ 0e00-0Of ff 6/8 Rns 
sO001000xiL1itiLi, 3.6a, rep fimn 1000-11ff£ 
;0001001xxxxRRRRR 3.7, rep reg 1200-13ff 31/32 regs 
pOOOLOlOXLiLLLGL, 3.8, bkrep fimm, #flong 1400-15ff£ 
70001011xxxxRRRRR, 3.9, bkrep reg, éf#long 1600-17£EF 31/32 regs 
;O00lixxaffffeccec, 3.12, moda funct, ax, cond 1800-1¢ff£ 13 func 
;00100rrrrrrrecce, 3.1la, callr Str, cond 2000-27ff 
;O010lrrrrrrrecce, 3.ib, bre Str, cond 2800-2f ff 
70011000xxxxxcccc, 3.2a, call tflong, cond 3000-31fE 

30011001 xxxxxcecc, 3.2b, br #ftlong, cond 3200-33ff 
70011010xxxxxcccc, 3.3, ret cond 3400-35ff 

O01 101 Lxxxxxxxxx, 3.4, reti 3600-37££ 
OOLLICOAXXXxXXxXxxX, 3.5, calla axl 3800~-39ff 
FOOLL1O1xxxxxxxxx unused [9] 3a00-3bf £ 

300111 10Aaaaaaaaa, 3.15, divs diradd, ax 3c00-3dff 
pOOLLLLIxxxxxxxxx unused [9] 3e00-3£ FE 

; eB Sh Se ee eh ee E88 88S Be SSR Re SS SSS VSS TA AVS SASS S SISA LIAAVIIS SBT S SS SSIS S= 
FOLXXXXXXXXAXAXAN PINE MOVE OPCODES: 4000-7f fF 

; bt +4 3-4-5 $+ 5 5 5 4 > St Ft +t +t _t_ $4} tf 4-4 4 tt tt tS ty yf tt ts tt tt 4 st $ S 4 t tt te te ty te tS + te 
;0100000AxxxRRRRR, 2.8, movp (axl), reg 4000-41ff 31/32 regs 
70100001ii IT ImmNNN, 2.9, movp (Rn)+, (Ri)+ 4200-43ff 6/8 Rns 
701000 Lxxxxxxxxxx unused [10] 4400-47££ 

; O1O0 LORRRRAmmNNN, 2.3a, mov reg, (Rn)+ 4800-4bff£ 

01001 1RRRRARmmNNN, 2.3b, mov (Rn)+, reg 4c00-4f ff 
;O10LONNNssssssss, 2.7, mov ftimm, Rn* 5000-57ff 
;010110D0D0DSSsssS, 2.5, mov sreg, dreg 5800-Sbff£ 31/32 regs 
pOLOLI1IOxxxxRRRRR, 2.4, mov ffiong, reg $c00-5d ££ 31/32 regs 
POLOLLLUXXXxxxxxx unused [9] 5e00-S5fff 
;0110000Aaaaaaaaa, 2.1b, mov diradd, ax 6000-61£f 
30110001Aasaaasaa, 2.1d, mov diradd, axh 6200-63f£ 
30110010Aasaaaaaa, 2.1c, mov diradd, axl 6400-65ff 

311001 lAaaaaaaaa, 2. le, mov diradd, axh, ev 6600-67f£ 

; 1101NNNaaaaaaaa, 2.6a, mov Rn*, diradd 6800-6fff 
;1LLLONNNaaaaaaaa, 2.6b, mov diradd, Rn* 7000-77££ 
;li110HAaaaaaaaa, 2.1a, mov axH, diradd 7800-7bf f 

pOLILIIOALLALi Lil, 2.248, mov fimm, axl 7c00-7dff 
FOLIIIIIASSssssss, 2.2b, mov #+imm, axh TeO0-7T£EE 

t SPSSPSS TOSS SSS STS SST HS SHRES ITT SKIS AAS O SSO SSA SST ES SSRIRMAES SSS SLSLSSSAOVSESASKSATASTESe 

$ LXXXXXXXAAXXAAKA PINE ALU OPCOOES: 8000-f fff 


S STEMS SSS SSK SSS LESS SASL ARS SAT SESS SHO SSATKARARTTEERAKAATNELSTSESIASESESSSTLAAAATERESLE 


t 

7 1OQOCOOADOXRRRRR, 
7 1OOOOOOADOXRRARR, 
j 1000000A00xRRRRR, 
§ 1000000A00xPRRRR, 
; LOQOOOCADOXRRRRR, 
7 10000xxx01xxxxxx 
3 100010xx01xxxxxx 
$1000110x0)xmmNNN, 
31000111A01xmmNAN, 
7 1001000A01xmmNNN, 
71003001 x01xxxxxx 
$ 100101 xxO1xxxxxx 
71001 1xxx0ixxxxxx 
: 1000000A10xmmNNN, 
+ 1000000A]0xmmNNN, 
7 10Q00000A10xmmNNN, 
t 1OQOOOOALOXmmNNN, 
3 10Co000A10xmmNNN, 
3 1O00000A1L lxxxxxx, 
; LOQOOOLALIXXxxxx, 
; LOQOOLOAL Ixxxxxx, 
;LOOOOLIALIxxxxxx, 
$ 1OODLOOALILXxxxxx, 
;LOOOLOLALIxxxxxx, 
7 LOOOLIxxLixxxxxx 
pLOOlxxxxL1xxxxxx 
3 101l0000Aaaaaaaaa, 
} 10LooocAaaaaaaaa, 


1.34, oper reg, ax 
1.3b, mpy y, reg 

1.3c, mac y, reg, ax 
1.34, sqr reg 

1.3e, sqra reg, ax 
unused [3,6] 

unused [2,6] 

1.6a, mpy (Rn}+t, ttlong 
1.6b, mac (Rn)+, t#long, ax 
1.6c,  msu (Rn)+, ttlong, ax 
unused [1,6] 

unused [2,6] 

unused [3,6] 

1.2a, oper (Rn})+, ax 
1.2b, mpy y, (Rn)+ 
1.2c¢, mac y, (Rn)}+, ax 
1.2d, sqr (Rn)+ 

1.2e, sqra (Rn)+, ax 
1.5a, add tflong, ax 
1.5b, sub fflong, ax 
1.5c, or éflong, ax 
1.5d,  xor #flong, ax 
1.5e, and fflong, ax 
1.5£, | cmp t#long, ax 
unused [2,6] 

unused [4,6] 

lela, oper diradd, sx 
l.lb, mpy y, diradd 


31/32 regs, 6/8 Rns 
6/8 Ras, 31/32 regs 


8000-B801£, 8100-811f 31/32 regs 
8000-801f£, 8100-811f 31/32 regs 
8000-801f, 8100-811f 31/32 regs 
8000-801f, 9100-811f£ 31/32 regs 
8000-801f, 8100-811£ 31/32 reqs 
8040, etc 


8840, 8940, 8a40, 8b40 
8c40-8cSf£, 8d40-Sd5E «6/8 
8e40-8e5f, 8f40-8£5f 6/8 
9040-905f, 9140-913f 6/8 
9240-927£, 9340-937£ 

9440, 9540, 9640, 9740 
9840, etc 


8080-809f, 
8080-809f, 
8080-809f, 
8080-809f, 
8080-809f, 


8180-819f 6/8 
6180-819f 6/8 
8180-819f 6/8 
8189-819f 6/8 
8180-819£ 6/8 


80c0, 81c0 

82¢c0, 83c0 

84c0, 85c0 

86c0, 87c0 

&8c0, 89c0 

8ac0, 8bc0 

8ccO, 8dcO, 8ec0, 8fc0 
9ec0, etc 

a000-bf ff 

a000-bffF 


Rns 
Rns 
Rns 


Rns 
Rns 
Rns 
Rns 
Rns 


} 10loo0c0Aaaaaaaaa, 
3 10lo000Aaaa4aaaaa, 
: 10looooAaaaaaaaa, 
fF LLOOOxxxxxxxxxxx 
$1100 LOxxxxxxxxxx 
71100110x0jjLi01T, 
£11002 10x xxxxxxx 
PLIOOLLIAOZFLLIII, 
pLLOOLL Ix Ixxxxxxx 
#1101000A0j 541i JIT, 
+ LLOLOOOXILxxxxxxx 
71101001 xxxxxxxxx 
SLLOLOIXXXRXXXXXX 
$1101 Uxxxxxxxxxxx 
FLIIOOCOALLILILIL, 
;ll10110Assssssss, 
P1L1011] lxxxxxxxxx 
SLLLUXXxxxxxxxxxx 


l.ic, 
1.1d, 
l.ie, 
unused 
unused 
l.Ja, 
unused 
1.7b, 
unused 
1.7e¢, 
unused 
unused 
unused 
unused 
14a, 
1.4b, 
unused 
unused 


mac y, diradd, ax 
sqt diradd 

sqra diradd, 8% 

{1i] 

[10} 

mpy (RJ)+, (Pi) 
{1,7} 

mac (Rj)+, (Ri), ax 
[1,7] 

msu (Rj)+t, (Ri)+, ax 
{1,7} 

{9] 

{10} 

(11) 

oper fimm, ax 

mpys ttimm, ax 


a0dcd-bf ff 
a000-bf ft 
a000-bf ff 
c000-c7£E 
c800-cbff 
cc00-cceTf, 
cct0-ccff, 
ce00-celf, 
ce80-ceff, 
d000-dO7f, 
dos0-doff, 
d200-d3ff 
a400-d7Tf£f 
d800-dE ff 
e000-ebf f 
ec00-edf f 
ee00-efff 
fOO0-fFfE 


cd00-cd7f 
cd80-cdf f 
cf00-cfTf 
cf80-cfff 
d100-d1i7£ 
d180-ciff 
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16.3 DSP INSTRUCTION SET--execution bus cycle times (0-wait): 








INSTRUCTION DESCRIPTION FLAGS | Reg | Ind | Dir | SIm | LIm 
ax += +0D 
ax +=+op << 16>ax | zveer- | 1 | 1 [| 1 | [| 
paddlop,ax ss ssfax+=op—™~—~—“*‘—‘~iCecEL- [| oT [7 [ 1 TO 
bisep.opyadd loon jo flaca t--- |e | 
Mbradd.[.cond)..- joe =add no eee | 
boc Soft [cond]: | pet or. Serene Te 
| call addf.cond}] | tos=pe:pe=add_ | -------- | od] CT tT 
PeAMacax) = 7 PROS = CL Ne = aki ener ee ee, 
| callr $off[,cond] | tos=pce:pe+=off  |[-------- | fd 
fclraxficond]  _——sfax=0 ———CT -E~- |] fT 
|clrrax[.cond] __—sf ax=0x8000.—“ sid --E-- | 7 ff 
Jompop.,ax  _—s—i{ flags=ax-+op ——s{| zmnvezz- [| 7 [| a | 3 | 1 [| 2 | 
ZMN-—E-~ a ae aS ae ee 
Gt. Se IO ee i eee ee 
|divsdir,ax sd unsigned dividestep | zm--E-- | ss | dT 2 [CU 
Peint eae ae a een oe. i Sa 
‘Ipg#op sd pageregister=op | -------- | 
|mac opl, op2,ax___'| ax+=p:p=opl *op2 | amnvcer- [ 1 [| 1 | 1 | | 2 | 
is ee ee 
| mov sop, dop [,eul_| dop = sop (data space) | -------- | 1 [| 1 [| 1 [| 1 | 2 | 
|movosop.don _—'| dopo = sop (pemspace) | -------- | | 3 [| | | | 
p= (v=op1) * (x=002) | -------- 
|mpvsy.#00. sod | p=v*(x=op) | we | ] 
amnvcrz- | 1 [| 1 | i | | 2 
ax = -ax zmNvcEL- | 1 {| | | | 
no operation Pa------—- | 1 fT 
fnormax.rm  _—sf if !Nax<<=1:modr | amnvcern | 2 [| [| |  |{ 
amn--E~-~ [| J | {| | 
ZMN--E-~ | J 
ax = p + 0x8000 ZMNVCEL- ae re Se: eee ee 
‘repop —Ssd| repeatnextoptimes | -------- | 1 | [| [| 1 [J 
fretf.cond) ss [pc=tos  —————iT ------ | 2 | ft 
Treti—st—t~t~“‘W. COC tosriep flagp=] | -w------ | 2 [| ft ft 
|rndaxficond] __{ ax+=0x8000_—isd| mmvezezx- [| 2 | of TC 
frolax[.cond] _| rotateleftthroughc _| zmn-ce-- [ 17 [ [| | | | 
|rorax[.cond] _[ rotaterightthroughe | zmy-ce-- | 1 [ [| | = =—[ 
[shlax[.cond] ___[ax<<=1] Sst amvecze-- [| 1 fT tT 
amnvez-- [| J [| | | td 
fshrax[.cond] _—[ax>>=1] Cid msocce-- [ 1 [ [| TT 
|shr4axficond] _fax>>=4  —iE ocE-- [| 1 ff 
fsqrop.—“‘C™é*sL i = (y=0p)* (x=0p) [| -------- | 1 oT 1 of ot fl 
|saraop,axs—s«| axt+=o0:p=op*on | zmnvezi- [ 1 [ 1 [ 1 [ | | 
sarsOpD.ax. Ss} ax-=p:p=op*op | zmnvezz- [ 7 [ 7 | 1 [ Jf 
/subh op, ax. ax-=+op<<16 ~~ || aaverz- [| 7 [ 1 | 1 [ [| 
ax -= OD pamveex- [7 [ 1 | 1 [ [| 
Dc: pc = 10: ie=0 ae ee eee eee ee 

xOr OD, ax 7 





z 
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DSP Instruction Set Appendix A 
pacr round product 
Syntax: pacr ax 
Operation: shifted p + 0x8000 -> ax 


Affects flags: 


rep 
Syntax: 


Operand: 


Operation: 


Affects flags: 


ret 


Syntax: 


Operation: 


Affects flags: 


reti 


Syntax: 


Operation: 


Affects flags: 


Z M N V c E L R 


* * * * * * * eis 


repeat next instruction 
rep operand 


#short immediate 
reg (except aX, p) 


Begins a noninterruptible single word 
instruction loop, to be repeated operand + 1 
(le.256) tames:.. 


No 


conditional return from subroutine 
ret [cond] 


T£ condition then 
tos -> pc 


No 


return from interrupt 
retl1 


tos -> pc 
1 -> ie 


No 
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mac multiply and accumulate previous product 

Syntax: mac operandi, operand2, ax 

Operands: y, Girect address 
Va At) 
y, reg (except aX, p) 
(x5), (ry) (XRAM & YRAM) 


(r,), ##long immediate 


Operation: aX + shifted p -> aX 
operandi -> y 
operand2 -> x 


x * Y -> Pp 
Affects flags: Z M N V CC E L 

* x x * * * x as 
moda modify accumulator conditionally 
Syntax: [moda] Function , aX [, cond] 
Operation: Tf condition then 


aX is modified by 'Function' 


Function: shr aX = aX >> 1 
shl aX = aX << 1 
shr4 aX = aX >> 4 
shi4 aX = aX << 4 
ror Rotate aX right through carry 
rol Rotate aX left through carry 
not aX = not (ax) 
neg aX = -ax 
elt aX = 0_ 
Copy aX = ax 
rnd aX = aX + 0x8000 
pacr aX = shifted p + 0x8000 
Cle aX = 0x8000 
Affects flags: According to function, when condition is true. 
modr Modify ry, 
Syntax: modr (r,) 
Operation: Y, 1s modified. 


Affects flags: Z M N V ‘@ E L R 


* 


—_ — omen — — teal —_ 


Note: R flag is set if r, register is zero, otherwise cleared. 
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SECTION 1 
Introduction 





1.1 General Description 


Drive Manager’s DSP (PINE) is a DSP engine for the Adaptec AIC-4411 Drive Manager Chip 
(DMC). It enables low-cost, low-power DSP processing. The core consists of the main blocks of 
a Central Processing Unit (CPU), including the ALU, multiplier, accumulators, RAM and ROM 
addressing units, and the program control logic. 


The DSP consists of three main execution units operating in parallel: the Computation Unit (CU), 
the Data Addressing Arithmetic Unit (DAAU) and the Program Control Unit (PCU). It has two 
blocks of data RAM for parallel feeding of two inputs to the multiplier. The CU has a 16 x 16 mul- 
tiplier, 36-bit ALU, and two 36-bit accumulators. The DSPDSP programming model and instruc- 
tion set are aimed at straight forward generation of efficient and compact code. 


1.2 Document Organization 


The key features of the DSP core are described in Section 2. The core block diagram and detailed 
descriptions of each block are given in Section 3. The DSP instruction set is explained in Section 
4. Section 5 describes the interface to the DSP core for ASIC design purposes, including details on 
clocking, exception handling. 


1.33 Related Documents 


DM_DBG User’s Manual 

DM_ASM and DM_COFEFLINK User’s Manual 

AIC-4411 Drive Manager Chip Data Sheet 

AIC-4411 Drive Manager Chip ROM Code User’s Guide 
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SECTION 2 
Architecture Features 





2.1 Technology Features 


¢ 16x16 bit 2's complement parallel multiplier with 32-bit product. 
e Single cycle multiply/accumulate instructions. 

¢ 36-bit ALU. 

¢ Two 36-bit accumulators. 


¢ On-chip 1Kx16 bit program ROM operation. (See Adaptec’s current “AIC-4411 Drive 
Manager Chip ROM Code User’s Guide” for details.) 


- Diagnostic commands 
- Code download commands 


e¢ 32Kx16 bit maximum addressable off-chip program/data space and 24Kx16 bit maximum 
off-chip program-only memory space. 


¢ Areas of the 32K off-chip program/data memory can be programmed in 8K blocks for 
access using either the RAM_CS or ROM_CS Chip Select signals. 


e 2x256x16 bit on-core data RAM. 


e On-chip 2Kx16 bit ROM and on-chip 2Kx16 bit RAM is accessible via program or data 
buses on the same address space. 


¢ Data RAMs can be also viewed for programmer as a single continuous RAM. 
e 16 level hardware stack. 


e (4+2) x16 bit general purpose pointer-registers with 2 dedicated Address Arithmetic Units 
for data memory (RAM/ROM) indirect addressing, circular buffering, loop counters, and 
program memory indirect addressing. 


e All general and most special-purpose registers are arranged as a global register set of 31 
registers for most data move and ALU instructions. 


e Shifting capability: 


- Accumulator shift +4, +1, -1, -4 
- Accumulator rotate | +1, -l 
- Product register to accumulator +1, 0, -1. 


e 2Kx16 bit common program/data RAM. 
e 2Kx16 bit common program data ROM. 


e Memory mapped I/O space (A000h-BFFFh) configurable to access any 8K-block of entire 
64K off-chip program space, which can be used for Flash chip programming. 
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e Automatic saturation mode on overflow while reading content of accumulators. 


e Zero overhead looping, REPEAT and BLOCKREPEAT instructions with one nesting 
level. 


e Memory mapped I/O. 
e Wait state support for off-chip memory or I/O. 
e STOP mode of operation for stopping the core. 


e Interrupts and exceptions: 

- 1 reset 

- 2 maskable interrupts 

- 1 TRAP (software interrupt) 
e Divide step support. 
e Normalize step support. 
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SECTION 3 
Programming Model 





3.1 General Description 


A high-level block diagram of the DSP architecture is shown in Figure 3-1. The major compo- 


nents of the DSP core are: 


e Data Buses - XDB, YDB, PDB 
e Address Buses - XAB, YAB, PAB 
e Multiplier 

* Input registers -X, Y 

* Output register -P 


* Output shifter 
¢ Data ALU/Shifter 


* Output accumulators - AO, Al 
* Saturation logic - SATU 
e Data Address Arithmetic Unit - DAAU 
* DAAU registers - RO +R3, R4+R5 
* DAAU config. registers - CFGI, CFGJ 
¢ Program Control Unit - PCU 


* Program Add. Arith. Unit - PAAU 
* Program decode controller 
* Interrupt controller 


¢ Memories - XRAM, YRAM, (PROM) 
e Stack 
e¢ Status Registers - STO, ST1, ST2 


e User-Defined Registers (off-core) -EXTO + EXT7 
e Internal Bus Switches 
e Input/Output 
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Figure 3-1 DSP Core Block Diagram 
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3.2 Buses 


3.2.1 Data Buses 


Data is transferred on the following 16-bit buses: a bidirectional X Data Bus (XDB); and two uni- 
directional buses - the Y Data Bus (YDB) and the Program Data bus (PDB). Data transfer 
between the Y Data Memory (YRAM) and the Multiplier (Y register) occurs over the YDB. 
Instruction word fetches take place in parallel over PDB. The bus structure supports register to 
register, register to memory, memory to register and program memory to data memory/register 
data movement. It can transfer up to two 16-bit words in the same instruction cycle. 


3.2.2 Address Buses 


Addresses are specified for the on-chip XRAM and YRAM on two unidirectional buses: the 16 bit 
X Address Bus (XAB), and the 10-bit Y Address Bus (YAB). Program memory addresses are 
specified on the 16-bit unidirectional Program Address Bus (PAB). 


3.3 Computation Unit 


3.3.1 Multiplier 


The multiplier unit consists of a 16x16 to 32 bit parallel, single- cycle, non-pipelined multiplier, 
two 16-bit input registers (X and Y), a 32-bit output register (P), and an output shifter. Together 
with the Data ALU, PINE can perform a single-cycle Multiply-Accumulate (MAC) instruction. 
The P register is updated only after a multiply instructions and not after a change in the X and/or Y 
registers. 


The X and Y registers may be read or written by the XDB, and the Y register by the YDB, as 16- 
bit operands. The 16-bit Most Significant Portion (MSP) of the P register, PH, may be written by 
the XDB as an operand. This enables a single-cycle restore of PH during interrupt service routine. 
The complete 32-bit P register can be used only by the ALU and can be moved only to the two 
accumulators. 


The X and Y registers can be also used as general purpose temporary data registers. 


The (P) register is sign extended into 36 bits and then shifted. 


3.3.2 Data ALU/Shifter 
The Data ALU/Shifter performs all arithmetic, logical and shifting operations on data operands. 


The Data ALU/Shifter consists of a 36-bit, parallel, single-cycle, non-pipelined ALU/Shift unit 
(ALU/S), two 36-bit accumulator registers (AO and A1), and a saturation unit (SATU). 
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The Data ALU/Shifter receives one operand from Ax (x=0,1), and another operand from either the 
output shifter of the multiplier, the XDB (through the bus alignment logic), or from Ax. The 
source operands may be 16 or 36 bits. Operations between the two accumulators are also possible. 
ALUIS results are stored in one of the accumulators. The source and destination accumulator of 
an instruction is always the same. 


The ALU/S can perform positive or negative accumulate, add, subtract, compare, shift, logical, 
and several other operations, most of them in one instruction cycle. It uses a two's complement 
arithmetic. 


Unless otherwise specified, in all operations between the 16-bit operand and Ax (36 bit), the 16-bit 
operand will be regarded as the LSP of a 36-bit operand with a sign extension for arithmetic oper- 
ations and a zero extension for logic operation. The ADDH, SUBH, ADDL and SUBL instruc- 
tions are used when this convention is not adequate in arithmetic operation (refer to these 
instructions in Section 4). 


Registers AxH and AxL can also be used as general-purpose temporary data registers. 


3.4 Data Address Arithmetic Unit (DAAU) 


The DAAU performs all address storage and effective address calculations necessary to address 
data operands in data and program memories. In addition, it supports loop counter operations in 

conjunction with the MODR instruction (see Chapter 4 on Instruction Set) and the R flag (see to 
Paragraph 3.7.2 on Status Registers). This unit operates in parallel with other core resources to 
minimize address generation overhead. The DAAU can implement two types of arithmetic: linear 
and modulo. The DAAU contains six 16-bit address registers (RO-R3 and R4-R5) for indirect 
addressing, and two 16-bit configuration registers (CFGI and CFGJ) for modulo and increment/ 
decrement step control. The registers are divided into two groups for simultaneous addressing 
over XAB and YAB (or PAB): RO-R3 with CFGI; and R4-R5 with CFGJ. Registers from both 
groups can be used for both XAB and YAB (or PAB) for instructions which use only one address 
register. In addition, in these instructions the XRAM and YRAM can be viewed as a single contin- 
uous data memory space. 


All DAAU registers may be read or written by the XDB as 16-bit operands, thus serving as gen- 
eral-purpose registers. 


3.4.1 Address Modification 


The DAAU can generate two 16-bit addresses every instruction cycle which can be post-modified 





_ by two modifiers: linear (step) and modulo modifier. The address modifiers allow the creation of ~~ ~~ 


data structures in memory for circular buffers, delay lines, FIFOs, software stacks, etc. They can 
also be used when the Rn registers are used as loop counters in conjunction with the MODR 
instruction (see Section 4 on Instruction Set) and the R flag of STO (see Section 3.7.2 on Status 
Registers). Address modification is performed using 16-bit (modulo 65,536) two's complement 
linear arithmetic. The range of values of the registers may be considered as signed (from -32,768 
to +32,767) or unsigned (from 0 to +65,536). 


“Ss 
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3.4.1.1 Linear (Step) Modifier 


During one instruction cycle, one or two (from different groups) of the address register, Rn, can be 
post increment/decrement by 1 or by a 2's complement 7-bit step (from -64 to +63). The selection 
of linear modifier type (one out of four) is included in the relevant instructions (see Section 4.2.2 

on Conventions for Instruction set). Step values STEPI and STEPJ are stored as the 7 LSB of the 
configuration register CFGI and CFGJ respectively. 


CFGI 
De. be de. ee i SO 29 8 7 6 5 4 3 2 1 0 


MOD I SE. . a 


CFGJ 
15 14) Ts ta2 11 10.9 8 7 6 > 4 3 2 1 0 


MOD J Sr ee ud 


Figure 3-2 Configuration Registers 
3.4.1.2 Modulo Modifier 


The two modulo arithmetic units can update one or two address registers from different groups 
during one instruction cycle. They are capable of performing modulo calculations of up to 2**9. 
Each register can be set independently to be affected or unaffected by the modulo calculation using 
the six Mn status bits in the ST2 register. Modulo values MODI and MODJ are stored in 9 MSBs 
of configuration registers CFGI and CFGJ respectively. 


For proper modulo calculation, the following constraints must be satisfied (M = modulo factor; q = 
STEPx, +1 or -1): 


1. The lower boundary (base address) must have zeros in at least the k LSBs, where k is the mini- 
mal integer that satisfies 2**k > M-lq| 


2 MODx (x denotes I or J) must be loaded with M-iql. 


M must be an integer multiple of q (this is always true for q=+/-1). 


SS) 


Note: Iqi denotes the absolute value of q. 


The modulo modifier operation, which is a post-modification of the Rn register, is defined as follows: 
Rn <- 0 in k LSB; if Rn is equal to MODx in k LSB and q > 0, 
Rn <- MODx in k LSB; if Rn is equal to 0 in k LSB and g <0, 
Rn <- Rn + q ; Otherwise 


Note: RO-R3 can only work with STEPI and MODI, while R4-R5 can work only with STEPJ and 
MOD]. 


\e 
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Examples: 


1. M=7 with STEPx=1 (or +1 selected in instruction), MODx=7-1=6, Rn=10H (hex). The 
sequence of Rn values will be: 10,11,12,13,14,15,16,10,11.,... 


2 M=8 with STEPx=2, MODx=8-2=6, Rn=10H. The sequence of Rn values will be: 
10,12,14,16,10,12.... 


3  M=9 with STEPx=-3, MODx=9-I-3l=6, Rn=16H. The sequence of Rn values will be: 
16,13,10,16,13.... 


3.5 Program Control Unit (PCU) 


10 


The Program Control Unit (PCU) performs instruction fetch, instruction decoding, exception han- 
dling, and wait state support. In addition, it controls the internal PROM protection (see Section 
3.6.2). 


3.5.1 Program Address Arithmetic Unit (PAAU) 


The Program Address Arithmetic Unit (PAAU) generates the next address to the program memory 
and controls hardware loops. It contains the Repeat/Block-Repeat unit, and two 16-bit directly- 
accessible registers: the Program Counter (PC) and the Loop Counter (LC) of the block-repeat 
unit. | 


The PAAU selects and/or calculates the next address from several possible sources: the incre- 
mented PC in sequential program flow; PROM address in branch or call operations; short PC-rela- 
tive address of 7-bit in relative branch operations; start address of hardware loop; interrupts vector 
in interrupt handling; or the Top of Stack (TOS) upon returning from subroutines and interrupts. It 
also writes the PC to the TOS in subroutines and interrupts. 


The PC always contains the address of the next instruction. 
3.5.1.1 Repeat and Block Repeat Unit 


The Repeat/Block-Repeat unit performs the hardware-loop calculations and control, with no over- 
head other than the one-time execution of set-up instructions REP and BKREP. In block-repeat 
operation, it stores the first and the last addresses of a loop and counts the number of loop repeti- 
tions. It consists of two 16-bit dedicated registers for start and end addresses of the block repeat, 
and two 8-bit repeat and block-repeat counters (1 to 256 repetitions). The start and end address 
registers as well as the 8-bit repeat counter cannot be accessed as registers by the programmer. 
The 8-bit block-repeat counter is the 8 LSB of the LC register, which is one of the global registers. 





occurs. 


Single-level nesting of a single-instruction repeat in the block-repeat instruction is supported. 
Interrupts are disabled only during a single-instruction repeat, and when the instruction is being 
repeated. For details of specific limitations, refer to REP and BKREP instructions in Section 4 on 
the Instruction Set. 
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The number of repetitions can be a fixed value in the instruction code or a value contained in one 
of the processor's 16-bit registers. This supports calculating the number of repetitions in run-time. 


For a clean jump (break) from a block-repeat, a special status bit, In-Loop (LP), is available in 
ST2. It is set when a block-repeat is executed and reset on normal completion of the block-repeat 
loop. The user must reset it when a jump out from the block-repeat loop occurs. See also Section 
3.7.2 on Status Registers. 


If the LP bit is cleared in the block repeat loop and not by one of the two last instructions of the 
loop, the processor is no longer in the loop state. Therefore, there will be no jumps to the first 
address of the loop and the counter will not be decremented. 

If the LP bit is cleared by one of the last two instructions of the loop, its effect will take place only 
in the next loop. (Unless the only instruction in the block repeat loop clears the LP and the LC is 2 
or more, then the loop will be performed 3 times.) 


The LC register may also serve as a general-purpose register for temporary storage. 
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3.6 Memory Spaces and Organization 
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Two independent memory spaces are available: the data space (XRAM and YRAM) and the pro- 
gram space (PROM). Each is 64K words. The addresses from 1000h to 7FFFh access the same 
memory from either the program or data buses. 


3.6.1 Data Memory 


The data space is divided into an X data space for the XRAM (from zero to 64511 <63K-1>), and 
a Y data space for the YRAM (from -1 to -1024). The range of the data space can also be consid- 
ered as unsigned, making the XRAM and YROM spaces continuous. The XRAM space has an 
internal space (on-core data RAM/ROM) of 1K (from 0 to 1023), and an external space of 62K. 
The YRAM space is internal only. See also Figure 3-3. The above data space partition allows 
modular expansion of the on-core XRAM and YRAM, and at the same time enables looking at the 
two RAMs as single continuous data RAM. 


The on-core XRAM and YRAM sizes are at least 2x144x16 bits and can be expanded in 2x64x16 
bit blocks from 2x128x16 bits (i.e. the next size is 2x192x16 bits, the one after that is 2x256x16 
bits, etc.) up to 2x1 Kx16 bits. The XRAM and YRAM can also be expanded by data ROM in 
64x16 bit blocks up to a total (RAM + ROM) of 2x1Kx16 bits. The X data memory can be 
expanded off-core (with no additional wait state cycles) up to the YRAM boundary. 


On-chip DMC peripherals are memory mapped I/O into the data space at address Exxxh. Wait 


state generation can be supported for off-chip memory. (See the current AIC-44XX Drive Manager 
Chip Data Sheet for programming details.) 


—_— ee =e EE eee lee 


i 
OFFFFh 
YRAM (On-Chip) 7 
OFFOOh 


























| 

| 

| | | 

Mem Mapped I/O (On-Chip) : | 
| 08000h | 
Common Prog/Data KRAM | 
(Off-Chip) 02000h | 
Prog/Data ROM (On-Chip) | 
. 01800h | 
Prog/Data RAM (On-Chip) | 
: : : 01000h | 

XRAM (On-Chip) 
00000h | 





Figure 3-3 Data Memory Map 
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3.6.2 Program Memory 


The program space starts at address 00010H. Addresses 0OOOH-0001H are used for Reset; and 
addresses 0008H-OOOFH are used for TRAP, BPI (Breakpoint interrupt), and two maskable inter- 
rupts respectively. Each interrupt address has been separated by two locations so that branch 
instructions can be accommodated in those locations if desired. Addresses 0002H-0007H are 
reserved (see Figure 3-4.). 


The internal PROM is 1K words and can be extended in 1K-word blocks up to 32K words. The 
program space may be expanded off-chip up to 64K words. 


The program memory addresses are generated by the PCU 














FFFFh 
Prog Code Area (Off-Chi 
8 ( P) Off-Chip 
Program 
8000h Daren 
7FFFh 
Prog/Data (Off-Chip) 
2000h 
Prog/Data ROM (On-Chip) 
Prog/Data RAM (On-Chip) 
0400h 
Boot ROM Code (On-Chip) 
| 0010h 
On-Chip 
Interrupt 1 P 
OOOEh I Ogram. 
Memory 
000Ch 
000Ah 
0008h 
0002h 
0000h 


Figure 3-4 Program Memory Map 
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3.6.3 Memory Addressing Modes 


There are two data addressing modes: 


1. Direct Addressing Mode: Eight bits from instruction as LSB plus eight bits from status register 
ST1 (see Section 3.7.2 on Status Registers) as MSB compose the direct address to the Data 
memory. The pages are thus of 256 words each. For example, page 0 is from 0 to 255 in 
XRAM, page 1 is from 256 to 511 in XRAM, and page 255 is from -256 to -1 in YRAM. 


2 Indirect Addressing Mode: The Rn registers of the DAAU are used for indirect addressing to 
the XRAM and YRAM. 


Addressing program memory is accomplished by: 


1. Indirect Addressing Mode: The Rn registers of the DAAU and the accumulator can be used for 
addressing the PROM in specific instructions. 


2 Special Relative Addressing Mode: Special Branch-Relative (BRR) and Call-Relative 
(CALLR) instructions support jumping relative to the PC (from PC-63 to PC+64). 
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3.7 Programming Model and Registers 


All of DSP core’s visible registers are arranged as a global register set of 31 registers, which can be 
accessed by most move and ALU instructions. The registers are listed below, organized according 


to units’ partition. Additional details on each register can be found in the description of each unit 
and in the following paragraphs. 


3.7.1 Programming Model 
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Programming Model (continued) 


PCU REGISTERS: 


15 (] 
PC LT 

1S QO 
NC eee ee 

GENERAL REGISTERS: 

15 0 

sto (| 7 
| 1S 0 
si LF 
1S 0 

sz [7 

15 0 
toss (____—i*”7 
* Up to 16X16-bit stack levels 


USER-DEFINED REGISTERS (Optional Off-Core): 
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3.7.2 Status Registers 


Three status registers are available for flags, status bits, control bits, user I/O bits, and paging bits 
for direct addressing. The contents of each register and their field definitions are described below. 


3.7.2.1 Status Registers Format 


STO 
15. ea -13 e..  O D 


pred eD TD Ded oT] ] eae foe 


Accumulator 0 
Extension Bits 


Zero Interrupt 
; Mask 
Minus 
Normalized Interrupt 
Enable 
Overflow 
Carry Saturation 
Mode 
Extension 
Limit 


Rn is Zero 


ST1 


15. 504: 13: I a. 0. 9 8 7 6 > 4 3 2 a QO 







Accumulator 1 
Extension Bits 


Data Memory Space 
Page 
Shift 
P Register 


Reserved 
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retseore er fofropexfon] oT 0 Jos] fo pa] ea [oo 


Interrupt IUSERI1 
Pending 
Stop IUSERO 
Mode OUSER1 
TEtOor OUSERO 


Notations: * Written as zero, read as don’t care 
Written as don’t care, read as 0 
Not 

Or 

And 

Exclusive-Or 


BOC 


Modulo Enable 
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3.7.2.2 Status Register Field Definition 
Most of the fields can be modified by writing to one of the status registers. 


The flags (Z, M, N, V, C, E, L ) indicate the result of the last ALU operation. At most of the cases 
the ALU output is latched at the destination accumulator, i.e. at most of the cases the flags indi- 
cates the destination accumulator status. 


If an instruction has a different effect than those listed under the status register fields, refer to the 
specific instruction in Section 4. 


STO Register 


Zero (Z) - Bit 11 
Set if the ALU output equals zero; cleared otherwise. 


The zero flag is cleared during processor reset. 
The zero flag can be modified by writing to STO. 


Minus (M) - Bit 10 
Set if ALU output is a negative number; cleared otherwise. The minus flag is the same as the MSB 
of the ALU output (bit 35). 


The minus flag is cleared during processor reset. 
The minus flag can be modified by writing to STO. 


Normalized (N) - Bit 9 
Set if the 32-bit of the accumulator which was the destination at the last instruction is normalized; 
cleared otherwise, 1.e. setif ZU ((bit 31 © bit 30) 7 ~E). 


The normalized flag is cleared during processor reset. 
The normalized flag can be modified by writing to STO. 


Overflow (V) - Bit 8 
Set if an arithmetic overflow (36-bit overflow) occurs after an arithmetic operation; cleared other- 
wise. It indicates that the result of an operation cannot be represented in a 36 bits. 


The overflow flag is cleared during processor reset. 
The overflow flag can be modified by writing to STO. 


Carry (C) - Bit 7 
Set if the result of an add generates a carry, or if the result of a subtract generates a borrow; cleared 


otherwise. It is also affected by the shift and rotate operations in the MODA instruction. 


The carry flag is cleared during processor reset. 
The carry flag can be modified by writing to STO. 
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Extension (E) - Bit 6 7 
Set if bits 35-31 of the ALU output, are not identical; cleared otherwise. It indicates that the result 
of an operation cannot be represented in a 32-bit accumulator. 


The extension flag is cleared during processor reset. 
The extension flag can be modified by writing to STO. 


Limit (L) - Bit 5 

Set if the overflow flag was set (overflow latch) or a limitation-occurred when performing a move 
instruction (MOV) from one of the accumulators (AxH and/or AxL) through the data bus. Other- 
wise it is not affected. 


The limit flag is cleared during processor reset. 
The limit flag can be modified by writing to STO. 


Rn register is zero (R) - Bit 4 
This flag is affected by the MODR and NORM instructions. The R flag is set if the result of the 
Rn. modification operation ( Rn ; Rn+1; Rn-1; Rn+S ) is zero; cleared otherwise. 


Note: If the Modulo is enabled for the specific Rn register, Rn reaches the buffer boundary, and 
the Modulo mechanism sets a OO00O0H value in the register - the R flag is cleared. 


The R flag status is latched until one of the above instructions is used. 


The R flag is cleared during processor reset. 
The R flag can be modified by writing to STO. 


Interrupt Mask (IMO, IM1) - Bits 2, 3 
IMO - Interrupt mask for INTO 

IM1 - Interrupt mask for INT1 

Clear - disable the specific interrupt 

Set - enable the specific interrupt 


The interrupt mask bits are cleared during processor reset. 
The interrupt mask bits can be modified by writing to STO. 


Interrupt Enable (IE) - Bit 1 
Clear - disable all maskable interrupts 


Set - enable all maskable interrupts 


The interrupt enable bit is cleared during processor reset. 


_. The interrupt enable bit can be modified by instructions EINT (enable interrupts), DINT CCIS ADI C cet. tsi ciereemednce 


interrupts), or by writing to STO. 

Saturation Mode (SAT) - Bit 0 

Clear - enable the saturation when transferring the contents of the accumulator onto the data bus 
Set - disable the saturation mode 

The saturation enable bit is cleared during processor reset. 


The saturation enable bit can be modified by writing to STO. 
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ST1 Register 


Shift P register (SP) - Bits 10, 11 
The shift P register bits control the scaling shifter at the P register output. 
SP bits 11, 10: 


SP = 00 no shift 

SP = 01 shift right 
SP = 10 shift left 
SP = 11 Reserved 


The SP bits are cleared during processor reset. 
The SP bits can be modified by writing to ST1. 


RAM Page (PAGE) - Bits 0, 1, 2, 3, 4, 5, 6, 7 
Used for direct address. Refer to Section 3.6.3 on Memory Addressing Modes. 


The PAGE bits can be modified by the LPG instruction or by writing to ST1. 


ST2 Register 


INT PENDING (IPO, IP1) - Bits 14, 15 

IPO - Interrupt pending for INTO 

IP1 - Interrupt pending for INT1 

The interrupt pending bit is set when the corresponding interrupt 1s active. The bit reflects the 
interrupt level regardless of the mask bits. 


The IPx bits are read only. 
STOP (STP) - Bit 13 
Set - stop processing mode (Low-power standby) 


Clear - normal operation 


The STOP bit is cleared during processor reset. 
The STOP bit can be modified by writing to ST2. 


INLOOP (LP) - Bit 12 
Set if a block repeat is executed; cleared by the user or at the end of the block-repeat. 


When transferring data into ST2, the LP bit will be influenced as follows: 
"0" The LP bit is unaffected. 
"1" The LP bit is cleared. 


This bit can be used to break from a block repeat. 


The inloop bit is cleared during processor reset. 
The inloop bit can be cleared by writing to ST2. 


In addition, refer to Section 3.5.1.1 on Repeat and Block-Repeat Unit. 
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IUSERO, TUSER1 (100, 1U1) - Bits 10, 11 
The IUSERx bits are read only and reflect the logic state of the corresponding user input pins. 


OUSERO, OUSER1 (OU0, OU1) - Bits 8, 9 
The OUSER«x bits can be modified by writing to ST2 and define the logic state of the correspond- 
ing user output pins. 


The OUSER«x bits are cleared during processor reset. 
The OUSERx bits can be modified by writing to ST2. 


Modulo set ( M0, M1, M2, M3, M4, MS ) - Bits 0, 1, 2, 3, 4, 5 

Cleared Mn bit - when using the corresponding Rn register, the Rn register will be modified as 
specified by the instruction regardless of the modulo option. 

Set Mn bit - when using the corresponding Rn register, the Rn register will be modified as speci- 
fied by the instruction using the suitable modulo. 


The Mn bits are cleared during processor reset. 
The Mn bits can be modified by writing to ST2. 


3.7.3 Stack 


A hardware stack is connected to the XDB and its top (TOS), and can be accessed as a Last-In- 

_First-Out (LIFO) data register file. The stack is automatically loaded with the PC whenever a sub- 
routine call or an interrupt occurs and popped back on return from subroutine or interrupt, respec- 
tively. 


3.7.4 User-Defined Registers 
The core supports 8 user-definable registers, which can be located on the DMC. This feature 
enables future expansion of the core. These registers appear in the data register fields of all rele- 


vant instructions. With these registers, external computation units can be loaded with data and 
- read at the end of the computation directly into internal registers in single cycle. 


3.8 Input and Output 


Memory mapped I/O is used. 


- Two special input bits and two output bits are available as status bits in status register ST2.Condi- 


tional instructions can be executed according to the two input bits. 
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Instruction Set 





4.1 Introduction 


This chapter provides an overview and detailed description of the DSP instruction set. The chapter 
also gives sufficient information to understand the nature of DSP programming and the capability 
of the instruction set itself. 


4.2 Notation and Conventions 


4.2.1 Notation 


The following notations are used in this chapter: 


Registers: 

rN = Address registers: r0, rl, r2, r3, r4, r5 
rl = Address registers: r0, rl, r2, 13 

rJ = Address registers: r4, r5 

ax = a0 or al 


aX] = Accumulator-low (LSP), x = 0, 1 
aXh = Accumulator-high (MSP), x = 0, 1 
axe = Accumulator extension, x = 0, 1 
ac = a0, al, aoh, alh, a0l, all 


cfgX = Configuration registers of DAAU (MODI or MODJ, STEPI or STEPJ), x =I, J 


tos = Top of stack 
pe = Program counter 
Ic =  =Loop counter 


extX = External registers, X = 0, 1,...7 


reg = a0, al, aOh, alh, al, all, rN, x, y, p or ph, pc, Ic, tos, stO, stl, st2, cfgl, cfgJ, extX 


DSP Core Programmer’s Manual 23 


Instruction Set Section 4 


Address Operands: 


On-chip data RAM/ROM 
Off-chip data RAM/ROM: 
Direct address = Paged direct address of 8 bits (see Chapter 3, Section 3.6.3 on addressing modes) 


Program ROM: 
Address = Unsigned 16 bits (0 to 65535) 
$Offset address = 2's complement 7 bits (-64 to 63 
offset range: -63 to 64) 
Immediate Operands: 
#Short immediate = Unsigned 8 bits (0 to 255) 
#Signed Short immediate =2's complement 8 bits (-128 to 127) 
##Long immediate = 2's complement 16 bits (-32,768 to +32,767 ) 
Assembler syntax: ___ decimal 


Ob___ ,OB____ binary 
Ox___,OX ___ hexadecimal 


When using hexadecimal representation, if the number starts with a letter (A-F), a leading zero 
must be inserted. 


cond - condition field: 


true Always 

eq Equal to zero 

neq Not equal to zero 

gt Greater than zero 

ge Greater or equal to zero 
It Less than zero 

le Less or equal to zero 

nn Normalize flag is cleared 
Vv Overflow flag is set 

C Carry flag is set 

e Extension flag is set 

satel tiestoecusteos VAM TAG 1S SOE cece ce 

nr R flag is cleared 


niuO [USERO input user pin 0 is cleared 
iu0 IUSERO input user pin 0 is set 
iu] IUSER1 input user pin 1 is set 
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Other: 


(x)= The contents of x 


{ } = Optional field at the instruction 
[x] = Specific notes 

-> = Is assigned to 

>> = Shift right 

<< = Shift left 

_ = Not 

- = Or 

_ = And 

Flags Notation: 


The effect of each instruction on the flags is described by the following notation: 
- The flag is affected by the execution of the instruction. 

- The flag is not affected by the instruction. 

lorO The flag is unconditionally set or cleared by the instruction. 


stO bits 11 10 9 8 7 6 > 4 
Flags Z M N V C E L R 


For flag definitions, refer to Section 3.7.2.2 on Status Register Field Definitions. 
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4.2.2 Conventions 
1. The arithmetic operations are performed in 2's complement. 


2 When rN register is used by an instruction, the contents of rN register are post-modified as fol- 


lows: 


Options controlled by instruction: 
rN, rN+1, rN-1, rN+step 
Options controlled by configuration registers CFGx: 
Step size: STEPI, STEPS - 2's complement 7 bits (-64 to 63) 
Modulo size: MODI, MODJ - unsigned 9 bits (1 to 512) 
Options controlled by st2: 
For each rN register it should be defined if MODULO is used or not. 
For using MODI or MODJ the relative Mn bit must be set. 


For more details on the modulo arithmetic unit refer to Section 3.4.1.2 on Modulo Modifier. 
Assembler syntax: (rN) , (rN)+, (rN)- , (fN)+S 


ph (the MSP of the p register) can be write only. The 32-bit p reg is updated after a multiply 
operation and can be read only by transferring it to the ALU, that is, it can be moved into aX or 
be an operand for arithmetic and logic operations. When transferring it into the ALU, it is sign- 
extended to 36 bits. This enables the user to store and restore the p register. 


The p register is used as a source operand for different instructions as follows: as one of the 
reg registers; at moda instruction - PACR function; at multiply instructions where the p register 
is added or subtracted from one of the accumulators. When using the p register as a source 
operand, it always means using the 'shifted p register'. Shifted p register means that the p reg- 
ister is sign-extended into 36 bit and then shifted as defined at the SP field, status register st1. 
In shift right the sign is extended, whereas in shift left a zero is appended into the LSB. The 
contents of the p register remain unchanged. 


All move instructions using the accumulator (@X) as a destination are sign extended. All 
instructions which use the accumulator-low (aXl) as a destination, will clear the accumulator- 
high and the accumulator-extension. Therefore, they are sign extension suppressed. 


Ail instructions using the accumulator-high (aXh) as a destination, will clear the accumulator- 
low and are sign extended. An exception is mov direct address,aXh, {eu}, when moving data 
into accumulator-high can be controlled with sign extension or with sign extension suppressed 
(the accumulator-extension aXe is unaffected). 


In all arithmetic operations between 16-bit registers and aX (36 bits), the 16-bit register will be 
regarded as the 16 low-order bits of a 36-bit operand with a sign extension in the Most-Order- 
Bits. 


It is recommended that the flags be used immediately after the ALU operation or moved into 
AC operations (see restrictions at 11.b). Otherwise, nvely ¢ careful ih prcgralns } 1S requires 


~ (some flags may be changed in the meantime). 


The condition field is an optional field; when the condition is missing then cond = true. 


When transferring data into the hardware stack, the data is transferred to the tos, and the stack 
is pushed down one level. When transferring data out of the hardware stack, the data is copied 
to the destination, and the stack is popped one level. 


10 ALU instruction is one of the following instructions: add, sub, or, and, xor, » cmp, addl, subl, 


addh, subh, moda, norm, mac, msu, sqra, sqrs. 
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11 General Restrictions: 


Instruction Set 


A Arithmetic and logical operations must not be performed with the same accumulator as the 


B_ st0 cannot be used as a source operand after one of the following instructions: 
1. An ALU instruction 
2. An instruction where st0/a0/a0l/a0h is the destination operand 


source (soperand) and the destination (doperand). Example: add a0,a0. 


12 Following the mov operand, pc and movp soperand, pc, a nop instruction must be placed. After 
a move instruction to the pc, the nop instruction is executed. Only then is the pc updated 
according to the move instruction, e.g. performing a jump instruction. When an interrupt 1s 
accepted after a move to pc instruction (jump instruction), the tos contains the destination of the 
jump address. 


4.3 Instruction Set Summary 


The following is a summary of the Pine instruction set organized by instruction group. Page num- 
bers for details of each instruction are shown at the right. 


ARITHMETIC & LOGICAL INSTRUCTIONS 


add Add 
sub Subtract 
or OR 
and AND 
xor Exclusive - OR 
cmp Compare 
addl Add to Low Accumulator 
subl Subtract from Low Accumulator 
addh Add to High Accumulator 
subh Subtract from High Accumulator 
moda Modify Accumulator Conditionally 
norm Normalize 
divs Division Step 
MULTIPLY INSTRUCTIONS 
mpy Multiply 
mac Multiply and Accumulate Previous Product 
msu Multiply and Subtract Previous Product 
mpys Multiply Signed Short Immediate 
sqr Square 
sqra Square and Accumulate Previous Product 
sqrs Square and Subtract Previous Product 
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34) 
35) 
37) 
38) 
38) 
39) 
39) 
_ 40) 
41) 
44) 
45) 


. 46) 
. 47) 
. 48) 
. 48) 
. 49) 
. 49) 
. 50) 
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MOVE INSTRUCTIONS 
mov Move Data 
movp Move Program Memory 
LOOP INSTRUCTIONS 
rep Repeat Next Instruction 
bkrep Block Repeat 


BRANCH / CALL INSTRUCTIONS 


br 
brr 
call 
callr 
calla 


ret 
reti 


Conditional Branch 

Relative Conditional Branch 
Conditional Call Subroutine 

Relative Conditional Call Subroutine 
Call Subroutine at Location Specified 
by the Accumulator 

Return Conditionally 

Return from Interrupt 


CONTROL & MISCELLANEOUS INSTRUCTIONS 


nop 
modr 

-eint 
dint 
trap 
Ipg 


No Operation 
Modify rN 

Enable Interrupt 
Disable Interrupt 
Software Interrupt 
Load the Page Bits 


(p. 51) 
(p. 54) 


(p. 55) 
(p. 56) 


(p. 57) 
(p. 58) 
(p. 58) 
(p. 59) 
(p. 59) 


(p. 60) 
(p. 60) 


(p. 61) 
(p. 61) 
(p. 62) 
(p. 62) 
(p. 63) 
(p. 63) 


Section 4 
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4.4 Instruction Set Details 


This section provides detailed descriptions of each instruction. It includes instruction syntax, 
description of operation, operand details, effect on flags, number of execution cycles, and other 
relevant notes and exceptions. 


The instructions are organized according to the groups listed in the summary in Section 4.3. 


4.4.1 Arithmetic and Logical Instructions 


add Add 


add operand , ax 


Operation: ax + operand -> aX 
Source Source Destination 
operand 1 operand 2 operand 


The instruction has two source operands which are added at the ALU, the 
ALU output is latched at the destination operand. 


The flags are affected according to the ALU output, in this instruction 
it reflects the status of the destination accumulator. 


Affects flags: Z M N V C EB L R 


* * * * * * * = 
Cycles: al 

2 when the operand is ##long immediate 
Words: Bf 

2 when the operand is ##long immediate 


'aX' means one of the accumulators a0 or al. This accumulator is both 
source operand and destination operand. 


The 'Operand' field is the other source operand, added at this instruc- 
tion and can be one of the following options - 


operand: reg 
#short immediate 
##long immediate 
(xN) 
direct address 
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reg - is one of the 31 Pine registers : a0, al, aOh, aih, a0Ol, ail, rn, 
Xx, YY, PB, pe, lic, tos, st0O, stl, st2, cfgI, cfgJ, extX. The contents of 
the source register is added to the accumulator. The operation result, 
the ALU output, is placed at the accumulator. | 


Example: 


add ri,a0 
Before execution After execution 
a0 1001H 1008H 


ri 7H 7 


| i 


Short Immediate - the 8-bit (positive number) is one of the source oper- 
ands. The 8-bit value is added, right-justified, to the accumulator. The 
operation result, the ALU output, is placed at the accumulator. 


Example: 


add #255,a0 
Before execution After execution 


a0 LOOL 


1256 


Long Immediate - the 16-bit value is one of the source operands. The 16- 
bit value is added, right-justified and sign-extended, to the accumula- 
tor. The operation result, the ALU output, is placed at the accumulator. 


E.g. 


add ##0OFFFFH,al 
Before execution After execution 


al 20H 1FH 
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(rN) - is indirect addressing. 


Source operand Data location 
» CTO ha 
rN - 16 bit 


One of the DAAU registers (r0, rl, r2, r3, r4, r5) points to one of the 
64k data words. The data location contents, pointed by the register, is 
the source operand - added to the accumulator. The operation result, the 
ALU output, is placed at the accumulator. 


The rN register is modified after the instruction is executed as follows: 


(rN) - no update 

(rN) + - ¥xN is autoincrement 

(rN) - - rN is autodecrement 

(cN)+S - xrN is autoincrement/autodecrement by the offset S 


Fach of these modifications can use the MODULO option. 


For further details regarding the postmodification, see section 4.2.2 
22) 2 


Example: 
add (r1)+S,a0 
Before execution After execution 


aQ 1001H 1101H 


ri. o 9 


Data location 7H 100H 100H 


CFJI meaning S=2 2 5 


st2 meaning no XXX0OH XXX0OH 


modulo option for rl 
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Direct Address - 


The data location, one of the 64k data words, is one of the source oper- 
ands. The 16-bit data location is composed of the page number at stil reg- 
ister and the ‘direct address' field - the offset at the page. The data 

location contents is added to the accumulator. The operation result, the 

ALU output, is placed at the accumulator. 


8 LSBs of stl ‘direct address’ field 
Page number Offset at Page Data location 
8 bit 8 bit 
Example: 
add 2,al 
Before execution After execution 


al OFPFFFFFFFH OH 


stl meaning page 1 OF301H 301H 


Data location 102H 1H 1H 
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sub Subtract 


sub operand , 


Operation: 


ax 


Instruction Set 


aX - operand -> ax 


operand: 


Affects flags: 


Cycles: 


Words: 


Z 


* 


ND FN 


reg 
(rN) 

direct address 
#short immediate 
##long immediate 


when the operand is ##long immediate 


when the operand is ##long immediate 
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or OR 


or operand , aX 


Operation: If operand is aX or p 
aX[bits 35-0] OR operand -> ax[bits 35-0] 


If operand is reg, (rN), 
short immediate, long immediate 
aX{bits 15-0] OR operand -> axX{bits 15-0] 
aX[bits 35-16] -> axX[bits 35-16] 


Clarification: If the operand is one of the accumula- 
tors or the p register, it is ORed with the destina- 
tion accumulator. | 


If the operand is a 16-bit register or an immediate 
value, the operand is zero-extended to form a 36 bits 
operand, then ORed with the accumulator. Therefore, 
the upper bits of the accumulator are unaffected by 
this instruction. 


operand: reg 
(rN) 
direct address 
#short immediate 
##1long immediate 


Affects flags: 2Z M N V C E L R 


* * * pa -_ * = en 
Cycles: 1 

2 when the operand is ##long immediate 
Words 1 

2 when the operand is ##long immediate 


34 DSP Core Programmer’s Manual 


Section 4 Instruction Set 


and AND 


and operand , ax 


Operation: If operand is aX or P 
aX[bits 35-0] AND operand -> axX[bits 35-0] 


If operand is short immediate 
aX{bits 7-0 ] AND operand -> ax[bits 7-0] 
aX[bits 15-8] -> axX[bits 15-8] [1] 
QO -> aX[bits 35-16] 


If operand is reg, (rN), long immediate 
aX[bits 15-0] AND operand -> axX{bits 15-0] 
0 -> aX[bits 35-16] 


Clarification: If the operand is one of the accumulators or 
the p register it is ANDed with the destination accumulator. 


If the operand is short immediate, the operand is zero- 
extended to form a 36-bit operand, then ANDed with the desti- 
nation accumulator. Bits 15-8 are unaffected; other bits of 
the accumulator are cleared. [1] 


If the operand is a 16-bit register or a long immediate 
value, the operand is zero-extended to form a 36-bit oper- 
and, then ANDed with the accumulator. Therefore, the upper 
bits of the accumulator are cleared by this instruction. 


operand: reg 
(xN) 
direct address 
#short immediate 
##long immediate 


Affects flags: 2 M N V C E L R 


* * * ra i * = _ 


Z flag is set if all the bits at the ALU output are zeroed, 
otherwise cleared. Note: when the operand is short immedi- 
ate, ALU output is bit[35:8] = 0, bits[{7:0] = aX[7:0] AND 
operand. 


Cycles: ‘ 
2 when the operand is ##long immediate 


Words: 1 


bo 


when the operand is ##long immediate 
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and AND _ (continued) 


[1] 


36 


The instruction and #short immediate, aX can be used for clearing 
some of the low-order bits at a 16-bit destination. 


For example: mov ram, aX 
and #short immediate, aX 
mov ax, ram 


Using the and instruction, bits 15-8 are unaffected, therefore the 
high-order bits at the destination do not change. 


In addition, this instruction can be used for BIT TEST, test one of 
the low-order bits of a destination. 


For example: mov ram, aX 
and #short immediate, aX 
br address,eg or br address,neq (check 
the zero flag) 
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xor Exclusive - OR 


xor operand , ax 


Instruction Set 


Operation: If operand is aX or p 
aX[bits 35-0] XOR operand -> aX[bits 35-0] 


If operand is reg, (rN), 


Clarification: 


operand: reg 


(rN) 


short immediate, long immediate 
aX[bits 15-0] XOR operand -> ax[{bits 15-0] 
aX[bits 35-16] -> axX[bits 35-16] 


If the operand is one of the accumulators or the p 
register it is Exclusive-ORed with the destination 
accumulator. 


If the operand is a 16-bit register or an immedi- 
ate value, the operand is zero-extended to form a 
36 bits operand, then Exclusive-ORed with the 
accumulator. Therefore, the upper bits of the 
accumulator are unaffected by this instruction. 


direct address 
#short immediate 


##long 


Affects flags: Z 


* 


Cycles: d: 
2 
Words: A; 
2 
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immediate 


N V C E L R 


* = aes * = _ 


when the operand is ##long immediate 


when the operand is ##long immediate 
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cmp Compare 
cmp operand , aX 
Operation: aX - operand 
operand: reg 
(rN) 
direct address 
#short immediate 


##long immediate 


Affects flags: Z M N V c E L R 


* * * * * * * = 


Cycles: it 
2 when the operand is ##long immediate 


Words: 1 


BO 


when the operand is ##long immediate 


addl Add to Low Accumulator 


addl operand , ax 


Operation: aX + operand -> ax 
The operand is sign-extension suppressed. 


operand: (rN) 
direct address 


reg [1] 


Affects flags: 2 M N V C E L R 


* * * * * * * - 


Cycles: i 


Words: i 


{1) The reg cannot” be: aX,” pe. 
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subl Subtract from Low Accumulator 
subl operand , ax 


Operation: aX - operand -> ax 
The operand is sign-extension suppressed. 


operand: (rN) 
direct address 


reg [1] 


Affects flags: Z M N V C E L R 


* * * * * * * = 


Cycles: 1 
Words: ul 


[1] The reg cannot be: ax, p. 


addh Add to High Accumulator 


addh operand , ax 


Operation: aX + operand*2*%16 -> ax 
The aXl is unaffected. 


operand: (rN) 
direct address 


reg (1] 


Affects flags: Z M N V Cc E L R 


* * * * * * * =o 


Cycles: 1 
Words: al 


[1] The reg cannot be: ax, p. 
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~subh Subtract from High Accumulator 


subh operand , ax 


Operation: aX - operand*2%16 -> aX 
The aXl is unaffected. 


operand: (rN) 
direct address 


reg [1] 


Affects flags: Z2 M N V C 


* * * * * 


Cycles: 1 
Words: 1 


[1] The reg cannot be: ax, p. 
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moda Modify Accumulator Conditionally 
moda func , aX , { cond } 
Operation: If condition then aX is modified by ‘func' 


The accumulator and the flags are modified according 
to the function field only when the condition is met. 


SHR 
SHL 
SHR4 
SHL4 
ROR 
ROL 
NOT 
NEG 
CLR 
COPY 
RND 


func: 


PACR 
CLRR 


Affects flags: 
Cycles: Al 
Words: 1 


[1] 


stl. 


[2] 
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aX = ax >> 
aX = ax << 
aX = aX >> 
aX = aX << 4 

Rotate aX right through carry 
Rotate aX left through carry 


Pp 


aX = not (ax) 

aX = -ax 

aX = 0 

aX = ax 

Round upper 20 bits of the ax 
aX = aX+8000H 

aX=shifted p + 8000H [1] 

aX = 8000H 


See below. 


Shifted p register means that the p register is sign-extended to 36 
bits and then shifted as defined at the SP field, 


status register 


At assembler syntax the moda can be omitted. 
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moda Modify Accumulator Conditionally (continued) 
SHR, SHR4 


Shift right step 


PET TEEPE EIEET TT TTT 
axe axh aXl 


Affects flags: Z M N V C E L R 


* x 


+ 
-) 

+ 

+ 

{ 

| 


C - Set according to the LSB (SHR bit 0, 
SHR4 bit 3) shifted out of the operand. 


SHL, SHL4 


Shift left step 


PT LTTILEL IE TET EILEL TTT TT 
axe axh | aXl | 


Affects flags: Z M N V es E L R 


* * * * * * = —_ 


C - Set according to the MSB (SHL bit 35, SHL4 bit 32) 
shifted out of the operand. 


V - Cleared if the operand being shifted could be repre- 


sented in 35 bits for SHL / in 31 bits for SHL4, set 
otherwise. 


ROR 


EERREEEE 


aX1 


TUT ILE ETT TT 


axh 








Affects flags: Z M N V C E L R 


C - Set according to the LSB (bit 0) 
shifted out of the operand. 
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moda Modify Accumulator Conditionally (continued) 


ROL 


STEEN T TT ETT | 


axh 








Affects flags: Z M N V G E L R 


C - Set according to the MSB (bit 35) 
shifted out of the operand. 


NOT, COPY, CLR, CURR 


Affects flags: 2Z M N V C E L R 
* * * = = * = = 

NEG, RND, PACR 

Affects flags: Z M N V C E L R 
* * * * * * * mas 
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norm Normalize 
norm ax , rN 


Operation: If N = 0 (aX is not normalized) 
then aX = ax * 2 
N is modified 
else nop 
nop 


This instruction is used to normalize the signed number at 
the accumulator. Affects the rN register. 


Affects flags: 2Z M N V C EB L R 


* * * * * * * * 


R flag is updated in norm instruction ONLY when rN pointer is 
modified. | 


C is set or cleared as at SHL (moda). 
Cycles: 2 
Words: a 
[1] The norm instruction uses the N flag to decide Pe shift or nop. 
Therefore when using norm at the first iteration, the flag must be 


updated according to ax. 


[2] To normalize a number using the norm instruction, the norm instruc- 
tion can be used together with a rep instruction. 


Example: rep #n 
norm aOQ, (x0) + 


Another method is to use the N flag for conditional branch. 


Example: NRM norm ad, (r0)+ 
brr NRM, NN 
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divs Division Step 
divs direct address ,ax 


Operation: aX - (direct address*2%15) -> ALU output 
If ALU output < 0 
then ax aX * 2 
else ax ALU output * 2+ 1 


Affects flags: 2Z M N V Cc E L R 


* * * * 


Cycles: 2 

Words: 1 

[1] The 16-bit dividend is placed at accumulator-low; the accumulator- 
high and the accumulator-extension are cleared. 


The divisor is placed at the direct address. 


For a 16-bit division, divs should be executed 16 times. After 16 
times the quotient is in the accumulator-low and the remainder is 
in the accumulator-high. 


The dividend and the divisor should both be positive. 
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4.4.2 Multiply Instructions 


mpy Multiply 
mpy operandl , operand2 
Operation: operandl -> y [1] 
operand2 -> x 
oF Ve SS 
operandl , operand2: y ; 
4 ' 
Y r 
(OO) 
(XN) , 


Affects flags: No 


Cycles: 1 


2 when the operand is 


Words: 1 


id] 


[2] 


LS] 


2 when the operand is 


Section 4 


Girect address 


(rN) 
reg [2] 
(rI) [3] 


##long immediate 


##long immediate 


##long immediate 


y -> y means that y retains its value. 


The reg cannot be aX, p. 


The multiplication at mpy (rJ),(rI) is between XRAM and 
YRAM only. Where rJ points to YRAM, rI points to XRAM. 
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mac Multiply and Accumulate Previous Product 


mac operandi , operand2 , ax 
Operation: aX + shifted p -> ax 
operandi -> y 
operand2 -> x 
xy => 
operandl , operand2: y ; 
Y , 
Y ’ 
(rJ) , 
(CN) , 


Affects flags: Z M N V C 


* * * * * 


Cycles: 1 


2 when the operand is 


Words: i: 


La) 


[2] 


[3] 


[4] 


2 when the operand is 


Shifted p register means that 
into 36 bits, then shifted by 
ter stil. 


1} 
[2] 


direct address 
(xN) 
reg 
(rT) 
##long 


[3] 
[4] 
immediate 


##long immediate 


##long immediate 


the previous product is sign-extended 
defined at the SP field, status regis- 


y -> y means that y retains its value. 


The reg cannot be ax, p. 


The multiplication at mac (rJ),(rI) is between XRAM and YRAM only. 


Where rJ points to YRAM , 
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msu Multiply and Subtract Previous Product 
msu operandl , operand2 , ax 


Operation: aX - shifted p -> ax [1] 


operandl -> y [2] 
operand2 -> x 
XK Fo Sp 
operandl , operand2: y , direct address 
Y ; (en) 
y ae 1° Re 
(rJ) , (xI) [4] 


(rN) , ##long immediate 


Affects flags: 2 M N V C E L R 


* * * * * * * 


Cycles: 1 
2 when the operand is ##long immediate 


Words: 1 
2 when the operand is ##long immediate 


[1] Shifted p register means that the previous product is sign-extended 
into 36 bits, then shifted as defined by the SP field, status reg- 
ister stl. 


[2] y->y means that y retains its value. 
[3] The reg cannot be ax, p. 


[4] The multiplication at msu (rJ),(rI) is between XRAM and YRAM only. 
Where rJ points to YRAM , ri points to XRAM. 


mpys Multiply Signed Short Immediate 


mpys y, #signed short immediate 


Operation: #signed short immediate -> x 


a) =o Dp 
Affects flags: No 
Cycles: iL 


Words: x 
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sqr Square 
sqr operand 
Operation: operand -> y 
operand -> x 
y x => Dp 
operand: (rN) 
reg [1] 
direct address 
Affects flags: No 
Cycles: a 


Words: 1 


[1] The reg cannot be ax, p. 


sqra Square and Accumulate Previous Product 
sqra operand ,ax 
Operation: aX + shifted p -> ax [1] 
operand -> y 
operand -> x 
YF SSD 
operand: (rN) 
reg EZ | 


direct address 


Affects flags: Z M N V C E L R 


x * x * * x x ss : 

Cycles: 1 

Words: 1 

[1] Shifted p register means that the previous product is sign-extended 
into 36 bits, then shifted as defined by the SP field, status regis- 


ter stl. 


[2] The reg cannot be ax, p. 
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sqrs Square and Subtract Previous Product 
sqrs operand , ax 
Operation: aX - shifted p -> aX ay 
operand -> y 
operand -> x 
y * X -> Dp 
operand : (rN) 
reg [2] 


direct address 


Affects flags: 2 ™M N V C E L R 


* * * * * * * ae 
Cycles: L 
Words: al 


[1] Shifted p register means that the previous product is sign-extended 
into 36 bits, then shifted as defined by the SP field, status regis- 
ter stl. 


[2] The reg cannot be ax, p. 
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4.4.3 Move Instructions 


mov Move Data 


mov soperand , doperand 


Operation: soperand -> doperand 
soperand , doperand reg ~~ xeG ee ee ee re a ee 
Leg , (rN) (Ade bo e163 
(rN) , reg [4], [5], [6] 
rN , direct address 
aXl , direct address 
axh , direct address 
Y , direct address 
Xx  , dalLrect address 


direct address , rN 

direct address , y 

direct address , x 

direct address , ax 

direct address , axl 

direct address , axh , {eu} [7] 
##long immediate , reg ay 
#short immediate , axl 

#Ssigned short immediate , axXh 
#signed short immediate , rN [8] 
#signed short immediate , y [8] 
#signed short immediate , x [8] 


Affects flags: No effect when doperand is not ac, st0 or when soperand 
is not aXl, axh 


When soperand is aXl or axh: 


When doperand is ac: 


Z M N V C E L R 


* * * ee = * = is [7] 


If doperand is st0, the instruction affects all the 
flags. 


Cycles: Af 
2 when the operand is ##long immediate 


Words: 1 
2 when the operand is ##long immediate 
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mov Move Data (continued) 


[1] The 32-bit p register can be transferred only to aX (mov p,ax ) 
ph is a write-only register, therefore soperand cannot be ph. 


[2] The 36-bit aX can be a soperand only with the following instruc- 
tions: mov a0,al ; mov al,aod. 


[3] With mov reg, the soperand cannot be the same as the doperand. 


[4] When the operand reg is the pe register, a nop instruction must be 
placed after the mov soperand,pc instruction. 


[5] No mov's are permitted between off-core memory and external regis- 
ters and vice versa. This means that mov extX, (rN) , mov (rN),extX 
rN can only point with internal RAM. 


[6] It is not permitted to move data from RAM address pointed by one of 
the rN registers to the same rN register (and vice versa) with post 
modified. 


[7] The eu field is an optional field. 


eu = accumulator extension is unaffected (sign extension sup- 
pressed) 


Instruction Accumulator Content 
Fields After The Instruction 
Ball Balt inne bits | 16 eget 16 — 


sign-extended Sign-extended DATA 























Pe clear clear DATA 
axh sign-extended DATA clear 
axh eu unaffected DATA clear 


The flags after executing mov direct address, axh, eu are the same 
as after executing mov direct address,axh. 


[8] Loading the doperand by short immediate number with sign- extension. 
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mov Move Data (continued) 
[9] Conventions: 


The instruction at PROM address 0100H mov pc,ram 


After execution (ram) =0101H 


mov (rQ0),xr0 


Before execution After execution 


RAM address 20H 1000 1000 
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movp Move Program Memory 

movp soperand , doperand 

Operation: soperand points to PROM -> doperand 
Move a word from Program ROM pointed by soperand to RAM or 
to reg pointed by doperand. When using aX as a soperand, 


the address is defined by accumulator-low. 


soperand , doperand: (aX) , reg (2) 
(CN) , (xT) 


Affects flags: No effect when doperand is not ac, st0. 
When doperand is ac: 
Z M N V c E L R 
If the doperand is st0O, the instruction affects all the 
flags. 
Cycles: 3 
Words: i: 


[1] When the operand reg is the pc register, a nop instruction must be 
placed after the movp (aX),pc instruction. 
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rep Repeat Next Instruction 
rep operand 


Operation: Begins a Single word instruction loop that is to be 
repeated operand+1 times. 


Repetition times is between 1 to 256. The rep instruction 
and the instruction being repeated are not interruptable. 


operand: #short immediate 
reg [1] 


Affects flags: No 

Cycles: L 

Words: HE 

fl] The reg cannot be aX, p. 


[2] When using reg as an operand, the number of times the instruction 
is to be repeated is defined by the low-order 8 bits of the reg. 


[3] Any instruction that breaks the program address continuity cannot 
be repeated. ( brr, callr, movp, trap, ret, reti, mov operand,pc 


,rep, calla) 


[4] rep can be performed inside block-repeat (bkrep). 
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bkrep Block Repeat 


bkrep operand , add 


Operation: operand -> lc [1] 


1 -> LP status bit 


Begins a block repeat that is to be repeated operand+1 
times. 


The number of repetitions ranges from 1 to 256. 


The first block address is the address after the bkrep 
instruction, and the last block, address is the address 
specified by the '‘add' field. [2] 


The operand is inserted into the loop counter lc regis- 
ter. The inloop status bit LP is set - enable block 
repeat. 


The repeated block is interruptable. 


operand: #short immediate 
reg boo C4) 


Affects flags: No 


Cycles: 2 


Words: 2 


[1] 


[2] 


[3] 


[4] 


15] 


[6] 


[7] 


When using #short immediate as an operand, it is copied to the low- 
order’ 6 bits of the Le. the high-order 8 bits are undefined. 


In case the last instruction at the block repeat is: 


a. One word instruction - 'add' is the address of this instruction. 
b. Two words instruction - ‘add' is the address of the second word 


of the instruction. 
When using reg as an operand the 16 bit register is transferred into 
the lc. The number of times the block is to be repeated is defined 
only by the low-order 8 bits. 


The reg cannot be aX, p, pec. 


When the block repeat is completed, the low-order 8 bits of the lc 


register contains OFFH; the high-order 8 bits are unaffected. 
The block repeat length can be one instruction. 


If a mov st2, doperand is performed one instruction prior last 
instruction of the loop, the value of the LP bit undefined. 
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bkrep Block Repeat (continued) 
[8] Restrictions: 
1. The last two instructions of the bkrep loop cannot be br, brr, 
call, callr, calla, trap, mov soperand, pc, movp soperand, pc, 


ret, reti, rep, bkrep. 


2. During a block-repeat loop there can be no jumps to the last 
address of the loop. Forbidden jumps are: 


brr, br, call, callr, calla, ret, reti, mov soperand, pc, 
movp soperand, pc. 


3. Restrictions relating the lc register usage at the block-repeat 
loop are: 


3.1. The lc register must not be written during the block-repeat 
loop. | 


3.2. The lc register must not be used one instruction prior to the 
last instruction of the block-repeat loop. 


3.3.If£ the block-repeat loop is one instruction long, the lc reg- 
ister must not be used in this instruction. 


4. Notice that illegal instruction sequences are also restricted as 
the last and first instructions of a block-repeat loop. 


4.4.5 Branch/Call Instructions 
br Conditional Branch 
br address , {cond} 


Operation: If condition 
then address -> pce 


If the condition is met, branch to the program memory loca- 
tion specified by ‘address'. 


Affects flags: No 

Cycles: 2 

Words: 2 

[1] If the condition is met, ‘address' is the address/label of the new 


program memory location. The 'address' is the second word of the 
instruction. 





DSP Core Programmer’s Manual | 57 


Instruction Set Section 4 


brr Relative Conditional Branch 


brr Soffset address , {cond} 


Operation: If condition then 
‘the brr inst.' + Soffset address + 1 -> pc 


If the condition is met, a branch is executed to the fol- 
lowing program memory location: ‘the brr instruction' + 
‘offset address' + 1 


The offset range is -63 to 64. (Offset range is ‘offset 
address'+1) 

Affects flags: No 

Cycles: 2 


Words: 1 


[1] Assembler syntax: 
brr Soffset address, {cond} 
or 
brr label , {cond} 
Where 'label' is the new program memory location. The instruction 
word includes the 'offset address' calculated by the assembler as 


follows: 
(label address) - (brr address) - 1. 


call Conditional Call Subroutine 
call address , {cond} 
Operation: If condition 
then pec -> tos 
address -> pec 
Tf the condition is met, the program counter is pushed into 
the stack and a branch is performed to the program memory 
location specified by ‘address'. 
Affects flags: No 
Cycles: 2 
Words: 2 
[1] If the condition is met, '‘address' is the address/label of the new 


program memory location. The 'address' is the second word of the 
instruction. 
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calir Relative Conditional Call Subroutine 
callr Soffset address , {cond} 


Operation: If condition then 
pe -> tos 
‘the brr inst.' + Soffset address + 1 -> pc 


If the condition is met, the program counter is pushed 
into the stack and a branch is executed to the following 


program memory location: 
‘the callr instruction' + ‘offset address' + 1 


The offset range is -63 to 64. (Offset range is ‘offset 
address'+1). 


Affects flags: No 
Cycles: 2 
Words: 1 


[1] Assembler syntax: 
callr Soffset address , {cond} 


or 
callr label , {cond} , | 
Where 'label' is the new program memory location. The 
instruction word includes the ‘offset address' calculated by 


the assembler as follows: 
(label address) - (callr address) - 1. 


calla Call Subroutine at Location Specified by the Accumulator 


calla axXl 
Operation: pc -> tos 
(aX) -> pc 
Call subroutine indirect (address from aX). 


The program counter is pushed into the stack and a branch 
is executed to the address pointed by accumulator-low. 


This instruction can be used to perform computed subrou- 
tine calls. 


Affects flags: No 
Cycles: 2 


Words: ad 
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ret Return Conditionally 


ret {cond} 


Operation: 


Affects flags: 
Cycles: Z 


Words: 1 


If condition 
then tos -> pc 


If the condition is met, the program counter is pulled 
from the stack. The previous program counter is lost. 
This instruction is used to return from subroutines or 
interrupts. 


No 


[1] This instruction can also be used as return from interrupt (INTO or 
INT1), to enable more interrupts, the IE bit at st0O must be set 


-reti Return from Interrupt 


reti 


Operation: 


Affects flags: 
Cycles: 2 


Words: | 1 


tos -> pc 
1 -> IE E24 


The program counter is pulled from the system stack. The 
previous program counter is lost. The IE bit is set - 
enable interrupts. [1] This instruction is used for 
return from interrupt. 


No 


[1] This instruction is used for returning from interrupts. The trap_ 
and BPI interrupt service routines must be ended with reti instruc- 
tion. In these cases, the IE status will be the same as it was 

before entering the routine. 
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4.4.6 Control and Miscellaneous Instructions 


nop No Operation 

nop 

Operation: No operation 
Affects flags: No 

Sie: 1 


Words: 1 


modr Modify rN 


modr (rN) 
Operation: rN is modified. 


Affects flags: Z M N V C E 10 R 


R flag is set if the 16-bit rN register is zero; 


otherwise cleared. 
Cycles: ai 
Words: 1 


[1] This instruction can be used also for loop control. 


Example: modr (rQ)- 
brr add , NR 
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eint Enable Interrupt 
eint 


Operation: 1 -> IE 


IE bit is set - Enable interrupts. 
Affects flags: No 
Cycles: 1 


Words: 1 


dint Disable Interrupt 
dint 


Operation: 0 -> IE 


IE bit is cleared - Disable interrupts. 
Affects flags: No 
Cycles: Hd 


Words: 1 
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trap Software Interrupt 


trap 
Operation: pc -> tos 


QOOOAH -> pe 
Disable interrupts (INTO , INT1). 


Software interrupt. 


The program counter which points to the next instruction 
is pushed into the stack. A branch to address location 
QOOOAH is executed. 


The interrupts (INTO, INT1) are disabled regardless of 
the interrupt mask bits: IE, IMO, IM1 at sto. 


Affects flags: No 
Cycles: 2 


Words: il. 


{1] trap instruction cannot be used at: trap service routine, BPI ser- 
vice routine. 


[2] For returning from trap service routine use reti instruction. 


Ipg Load the Page Bits 
lpg #short immediate 


Operation: #short immediate -> page bits 


The page bits, the low-order 8 bits of sti, are loaded 
with an 8-bit constant (0 to 255). 


Affects flags: No 
Cycles: 1 


Words: 1 
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4.5 Instruction Execution 


4.5.1 Pipeline Method 


The program controller implements a three-level pipeline architecture. In the operation of the 
pipeline, concurrent fetch, operand fetch and execution occur. This allows instruction execution to 
overlap. Thus, the effective execution time for most instructions is one cycle. Each pipeline stage 
is completed before its result is needed by the next instruction. The pipeline is an "interlocking" 
pipeline, transparent to the user, which simplifies programming. 


The following chart shows the pipeline operation: 


| cyclel | cycle2 | cycle3 | cycle4 | cycle5 | 

| | | | | | 

fetch | <---n~--->|<--n+1-->|<--n+2-->| nae | | 
| | | | | | | 
op. fetch | ee |<---n--->|<--n+1-->]<--n+2-->| | 
| | | | | | 

execution | | as |<-~--n--->|<--n+1-->|<--n+2-->| 
| | 


| | | | 


Three instructions are executed for each cycle. For example in cycle 3, the fetch of instruction 
n+2, the operand fetch of instruction n+1 and the execution of instruction n are active. 
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5.1 Introduction 


This section describes the basic core clock interface. It includes descriptions of the core clock, the 
reset mode, the handling of interrupts and their priorities, the core signals and cycles. 


5.2 Clock 


The DSP core is driven by an off-core clock generator. 


DSP status bit STP (bit 13 of ST2) is routed to the core edge and can be used by the system clock 
generator to stop the clock and enter the STOP mode. 


5.3 Reset 


Reset is a non-maskable interrupt that can be used at any time to put the DSP core into a known 
state. Reset is typically applied after power up when the machine is in a non-deterministic state. It 
is also used to exit STOP mode. 


When a RESET is applied to the core, the processor enters the reset processing state, the processor 
terminates execution and forces the program counter to zero. Therefore, when the RESET signal 
is deactivated, execution starts from location 0O000H. Reset affects various registers and status 
bits. However when RESET is applied during STOP mode, the contents of the RAM and other reg- 
isters are unaffected. 


The following register bits are cleared during reset: 


STO bits 0+11, ST1 bits 10+11, ST2 bits 0+9, ST2 bits 13+12 
PC register (0:15) 


For more details about reset effects on status registers, see Section 3.7.2.2. 


The RESET signal (reset request to the core) must be active for at least 6 cycles. The fetch from 
address OOOOH is executed 1 cycle after RESET is deactivated. 
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5.4 Interrupts 


The DSP core has three interrupts: two maskable (INTO and INT1) interrupts and one break-point 
interrupt (BPI). It also has one software interrupt (TRAP). The hardware interrupts are high level- 
sensitive. 


Table 5-1 DSP Core Interrupts 


Memory Interrupt name & function 
location 


ooo [ese «id 
ones [nr enenatierimerps [sven 


* Start address for the interrupt/reset routine. 








Jumping to the interrupt service routine takes two cycles. The only exception to this is after a 
move instruction to the PC, which takes only one cycle. 


5.4.1 BPI, INTO, INT1 
Interrupts are accepted and serviced at the end of the current instruction execution. Interrupt ser- 
vicing will be delayed when one of the following cases occurs: 


1. Until the completion of all the cycles of a multicycle instruction including expansion of read/ 
write cycles due to wait states. 


2. Until the end of the REP instruction and the instruction being repeated. 
When the processor is in STOP mode. 

4. Inthe cycle after fetch of the following commands: DINT; mov, soperand, STO; movp (aX), 
STO. 


If more than one interrupt is pending and unmasked, the interrupt with the highest priority is 
accepted and serviced. 
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5.4.1.1 BPI - Breakpoint Interrupt 


This interrupt is an active high, non-maskable interrupt. When executing a BPI service routine, 
another BPI will not be accepted. 
When the BPI is accepted, DSP core performs the following: 


PC -> TOS 
O008H -> PC (interrupt starting address) 
[ACK pulse is generated 


The TRAP instruction cannot be used inside a BPI service routine. 
The BPI service routine must end with a RETI instruction. 


5.4.1.2 5.4.1.2 TRAP - Software Interrupt 


When executing a TRAP service routine, another TRAP cannot be used. Due to interrupt priorities 
(see above table) a BPI interrupt can be accepted inside a TRAP routine; INTO and INT1 are not 
accepted. 
When the TRAP is accepted, DSP core performs the following: 

PC -> TOS 

OOOAH -> PC (interrupt starting address) 


A TRAP service routine must end with a RETI instruction. 


5.4.1.3 INTO,INT1 - Maskable Interrupts 
Interrupts INTO,INT1 are active high, maskable interrupts. 


When an interrupt is accepted while the IE status bit is set and the individual interrupt is not 
masked (the corresponding IMx is set), DSP core performs the following: 


IE status bit cleared 

PC -> TOS 

OOOCH or QOOEH -> PC (interrupt starting address) 
IACK pulse is generated 

IMx is unaffected 


Return from an interrupt service routine by RETI or by RET. When using the RET instruction, the 
IE flag must be set in order to enable interrupts again. 
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Notes: 


1. A typical interrupt is activated by applying a high level to the INTO/INT1 input, thus setting 
the corresponding IPx bit. When the interrupt is acknowledged, the IE at the status register is 
disabled. If the interrupt signal at the input pin continues to be active and the IE is still dis- 
abled, no interrupts will be generated. If the interrupt signal level is removed before the IE is 
enabled, no further interrupts are generated. If the interrupt request continues to be active and 
the IE bit is subsequently set, then another interrupt will be generated after setting the IE. 


2. The PRIORITY between INTO/INT1 is significant only if more than one interrupt is received 
at the same time or when the IE is disabled for some time and both INTO and INT1 were 
received. In these cases, the interrupt will be acknowledged according to the interrupts priori- 
ties. | 
In case the processor is handling the INT1 service routine and INTO was received, the IPO bit 
will be set and the processor will enter the INTO service routine according to the status bits: IE, 
IMO. Similar handling will occur if the processor handles INTO service routine and INT1 was 


received. 
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